@conference {plaisant_exploring_2006,
	title = {Exploring Erotics in Emily Dickinson{\textquoteright}s Correspondence with Text Mining and Visual Interfaces},
	booktitle = {Proceedings of the 6th ACM/IEEE-CS Joint Conference on Digital Libraries},
	series = {{JCDL} {\textquoteright}06},
	year = {2006},
	note = {00053},
	pages = {141{\textendash}150},
	publisher = {{ACM}},
	organization = {{ACM}},
	address = {New York, {NY}, {USA}},
	abstract = {This article examines how document repositories can be utilized for humanities research and critical interpretation. The article specifically focuses on the rapidly expanding field of text mining. A case study of 300 XML encoded letter written between Emily Dickinson and her sister-in-law Susan Huntingdon Dickinson was used by the authors to experiment with their methods and test their theories. The authors argue that in order for computational methods to significantly effect the humanities discipline the tools developed must be concerned with scholarly interpretation and be useable by non-experts. Using a multinomial na{\"\i}ve Bayes algorithm, the authors trained a computer program to "read" the Dickinson correspondence for erotic language and to then classify the letters based on the appearance (or not) of this language. The panel of literary scholars was particularly pleased by how accurately the algorithm classified the letters. Feedback was given for improving aesthetic qualities of the user interface but overall the tool proved both useful and useable. },
	keywords = {case studies, humanities, literary criticism, text mining, user interface, visualization},
	isbn = {1-59593-354-9},
	doi = {10.1145/1141753.1141781},
	url = {http://doi.acm.org/10.1145/1141753.1141781},
	author = {Plaisant, Catherine and Rose, James and Yu, Bei and Auvil, Loretta and Kirschenbaum, Matthew G. and Smith, Martha Nell and Clement, Tanya and Lord, Greg}
}
@article {clement_knowledge_2011,
	title = {Knowledge Representation and Digital Scholarly Editions in Theory and Practice},
	journal = {Journal of the Text Encoding Initiative},
	number = {Issue 1},
	year = {2011},
	note = {00007},
	abstract = {In this article, Tanya Clement uses the case study of Baroness Elsa von Freytag-Loringhoven{\textquoteright}s unpublished poetry to explore knowledge representation and scholarly editing. Clement begins by describing the nature of Freytag-Loringhoven{\textquoteright}s work and the structure of the digital edition built using TEI and the Versioning Machine. Clement asserts that the theory behind this digital edition comes from John Bryant{\textquoteright}s notion of the fluid text. Clement acknowledges that there are varying opinions on the usefulness of the digital space for creating editions, but that in this case, the medium was superior for representing the poems as versions.},
	keywords = {digital editions, interface development, knowledge representation, scholarly editing, text encoding, versioning},
	issn = {2162-5603},
	doi = {10.4000/jtei.203},
	url = {http://jtei.revues.org/203},
	author = {Clement, Tanya}
}
@conference {don_discovering_2007,
	title = {Discovering Interesting Usage Patterns in Text Collections: Integrating Text Mining with Visualization},
	booktitle = {Proceedings of the Sixteenth ACM Conference on Conference on Information and Knowledge Management},
	series = {{CIKM} {\textquoteright}07},
	year = {2007},
	note = {00107},
	pages = {213{\textendash}222},
	publisher = {ACM},
	organization = {ACM},
	address = {New York, NY, USA},
	abstract = {This article explores the use of computational methods - specifically text mining - for humanities research. The authors begin by arguing that, while humanities scholars use computers to access documents, they rarely use them to assist with literary interoperation or to develop research hypotheses. Text mining is wonderful for identifying patterns and searching through large bodies of text. However, the results it generate are often hard to interpret and, therefore, this method is avoided by humanities researchers. The authors of this article explore the development of a program called FeatureLens to is "designed to fill a gap by allowing users to interpret the results of the text mining thru visual exploration of the patterns in the text." FeatureLens "aims at integrating a set of text mining and visualization functionalities into a powerful tool, which provokes new insights and discoveries." By generating frequent expression lists, frequent work lists, and n-grams, FeatureLens is able to parse complicated text documents and reveal interesting patterns. },
	keywords = {digital humanities, frequent closed itemsets, n-grams, text mining, user interface},
	isbn = {978-1-59593-803-9},
	doi = {10.1145/1321440.1321473},
	url = {http://doi.acm.org/10.1145/1321440.1321473},
	author = {Don, Anthony and Zheleva, Elena and Gregory, Machon and Tarkan, Sureyya and Auvil, Loretta and Clement, Tanya and Shneiderman, Ben and Plaisant, Catherine}
}
